#!/usr/bin/env python

#
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements.  See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License.  You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

# Script that updates verions for datafusion crates, locally
#
# dependencies:
# pip install tomlkit

import re
import argparse
from pathlib import Path
import tomlkit

crates = {
    "datafusion": "datafusion/core/Cargo.toml",
    "datafusion-cli": "datafusion-cli/Cargo.toml",
    "datafusion-common": "datafusion/common/Cargo.toml",
    "datafusion-data-access": "datafusion/data-access/Cargo.toml",
    "datafusion-expr": "datafusion/expr/Cargo.toml",
    "datafusion-jit": "datafusion/jit/Cargo.toml",
    "datafusion-physical-expr": "datafusion/physical-expr/Cargo.toml",
    "datafusion-proto": "datafusion/proto/Cargo.toml",
    "datafusion-row": "datafusion/row/Cargo.toml",
}

ballista_crates = {
    "ballista-cli": "ballista-cli/Cargo.toml",
    "core": "ballista/core/Cargo.toml",
    "client": "ballista/client/Cargo.toml",
    "executor": "ballista/executor/Cargo.toml",
    "scheduler": "ballista/scheduler/Cargo.toml",
}


def update_datafusion_version(cargo_toml: str, new_version: str):
    print(f"updating {cargo_toml}")
    with open(cargo_toml) as f:
        data = f.read()

    doc = tomlkit.parse(data)
    doc.get("package")["version"] = new_version

    with open(cargo_toml, "w") as f:
        f.write(tomlkit.dumps(doc))


def update_downstream_versions(cargo_toml: str, new_version: str):
    with open(cargo_toml) as f:
        data = f.read()

    doc = tomlkit.parse(data)

    for crate in crates.keys():
        df_dep = doc.get("dependencies", {}).get(crate)
        # skip crates that pin datafusion using git hash
        if df_dep is not None and df_dep.get("version") is not None:
            print(f"updating {crate} dependency in {cargo_toml}")
            df_dep["version"] = new_version

        df_dep = doc.get("dev-dependencies", {}).get(crate)
        if df_dep is not None and df_dep.get("version") is not None:
            print(f"updating {crate} dev-dependency in {cargo_toml}")
            df_dep["version"] = new_version

    with open(cargo_toml, "w") as f:
        f.write(tomlkit.dumps(doc))


def update_docs(path: str, new_version: str):
    print(f"updating docs in {path}")
    with open(path, "r+") as fd:
        content = fd.read()
        fd.seek(0)
        content = re.sub(
            r'datafusion = "(.+)"', f'datafusion = "{new_version}"', content
        )
        fd.write(content)


def main():
    parser = argparse.ArgumentParser(
        description=(
            "Update datafusion crate version and corresponding version pins "
            "in downstream crates."
        )
    )
    parser.add_argument("new_version", type=str, help="new datafusion version")
    args = parser.parse_args()

    new_version = args.new_version
    repo_root = Path(__file__).parent.parent.absolute()

    print(
        f"Updating datafusion crate versions in {repo_root} to {new_version}"
    )
    for cargo_toml in crates.values():
        update_datafusion_version(cargo_toml, new_version)

    print(
        f"Updating datafusion dependency versions in {repo_root} to {new_version}"
    )
    for cargo_toml in crates.values():
        update_downstream_versions(cargo_toml, new_version)
    for cargo_toml in ballista_crates.values():
        update_downstream_versions(cargo_toml, new_version)

    update_docs("README.md", new_version)


if __name__ == "__main__":
    main()
